; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
; RUN: llc < %s -mtriple=x86_64-apple-macosx10.15 | FileCheck %s

%0 = type <{ half }>
%1 = type <{ <16 x half> }>

define void @foo(ptr %0, ptr %1, ptr %2) #0 {
; CHECK-LABEL: foo:
; CHECK:       ## %bb.0:
; CHECK-NEXT:    pushq %rbp
; CHECK-NEXT:    movq %rsp, %rbp
; CHECK-NEXT:    andq $-32, %rsp
; CHECK-NEXT:    subq $64, %rsp
; CHECK-NEXT:    movl (%rdx), %eax
; CHECK-NEXT:    andl $15, %eax
; CHECK-NEXT:    vpinsrw $0, (%rdi), %xmm0, %xmm0
; CHECK-NEXT:    vmovups (%rsi), %ymm1
; CHECK-NEXT:    vmovaps %ymm1, (%rsp)
; CHECK-NEXT:    vpextrw $0, %xmm0, (%rsp,%rax,2)
; CHECK-NEXT:    vmovaps (%rsp), %ymm0
; CHECK-NEXT:    vmovups %ymm0, (%rsi)
; CHECK-NEXT:    movq %rbp, %rsp
; CHECK-NEXT:    popq %rbp
; CHECK-NEXT:    vzeroupper
; CHECK-NEXT:    retq
  %4 = bitcast ptr %2 to ptr
  %5 = load i64, ptr %4, align 8
  %6 = getelementptr inbounds %0, ptr %0, i64 0, i32 0
  %7 = load half, ptr %6, align 2
  %8 = getelementptr inbounds %1, ptr %1, i64 0, i32 0
  %9 = load <16 x half>, ptr %8, align 16
  %10 = trunc i64 %5 to i32
  %11 = insertelement <16 x half> %9, half %7, i32 %10
  store <16 x half> %11, ptr %8, align 16
  ret void
}

attributes #0 = { nounwind "target-features"="+f16c" }
